/* Generated By:JavaCC: Do not edit this line. PageDescription.java */
package net.nutch.quality.dynamic;
import java.io.*;
import java.util.*;
/************************************************
* PageDescription gives the URL and the textual
* description for a target page. It is populated
* by parsing a Sherlock plugin file.
*
* @author Mike Cafarella
************************************************/
public class PageDescription implements PageDescriptionConstants {
// Top-level parameters collected by param(): lower-cased keyword -> value string.
HashMap values = new HashMap();
// One HashMap per element introduced by token kind 13 (see element()), in
// source order; each map is filled by inputItem() and may hold null values.
ArrayList inputs = new ArrayList();
// One HashMap per element introduced by token kind 14 (see element()), in
// source order; each map is filled by matchItem().
ArrayList interprets = new ArrayList();
/**
 * Returns the top-level keyword/value pairs gathered while parsing.
 * The returned map is the parser's own instance, not a copy.
 *
 * @return the live map of lower-cased keywords to their values
 */
public HashMap getValues() {
  return this.values;
}
/**
 * Returns the list of input descriptions gathered while parsing.
 * Each entry is a HashMap; the list is the parser's own instance, not a copy.
 *
 * @return the live list of input attribute maps
 */
public ArrayList getInputs() {
  return this.inputs;
}
/**
 * Returns the list of interpret descriptions gathered while parsing.
 * Each entry is a HashMap; the list is the parser's own instance, not a copy.
 *
 * @return the live list of interpret attribute maps
 */
public ArrayList getInterprets() {
  return this.interprets;
}
/**
 * Command-line smoke test for Sherlock parsing: parses the file named by
 * the first argument and exits. Prints a usage line if no argument is given.
 *
 * @param argv argv[0] is the path of the file to parse
 * @throws IOException if the file cannot be opened or closed
 * @throws ParseException if the file does not match the grammar
 */
public static void main(String argv[]) throws IOException, ParseException {
  if (argv.length < 1) {
    System.out.println("Usage: java net.nutch.quality.dynamic.PageDescription <srcFile>");
    return;
  }
  InputStream in = new FileInputStream(new File(argv[0]));
  try {
    PageDescription pd = new PageDescription(in);
    pd.parse();
  } finally {
    // Release the file handle even when parsing fails.
    in.close();
  }
}
/**
 * Top-level production. Consumes, in order: token kind 10, any number of
 * KEYWORD-introduced parameters (see param()), token kind 11, any number of
 * elements introduced by token kinds 13, 14 or 15 (see element()), and an
 * optional trailing token of kind 12.
 *
 * The jj_la1[] writes record the generation at which each choice point last
 * fell through; generateParseException() reads them to build error messages.
 *
 * @throws ParseException if the token stream does not match this sequence
 */
final public void parse() throws ParseException {
  jj_consume_token(10);

  // ( param() )*
  while (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == KEYWORD) {
    param();
  }
  jj_la1[0] = jj_gen;

  jj_consume_token(11);

  // ( element() )*
  for (;;) {
    final int upcoming = (jj_ntk == -1) ? jj_ntk() : jj_ntk;
    if (upcoming != 13 && upcoming != 14 && upcoming != 15) {
      jj_la1[1] = jj_gen;
      break;
    }
    element();
  }

  // Optional token of kind 12.
  if (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == 12) {
    jj_consume_token(12);
  } else {
    jj_la1[2] = jj_gen;
  }
}
/**
 * Parses one top-level "KEYWORD = value" pair and stores it in the values
 * map under the lower-cased keyword.
 *
 * @throws ParseException if the next tokens are not KEYWORD, EQUALS, value
 */
final public void param() throws ParseException {
  jj_consume_token(KEYWORD);
  // Use a fixed locale so keys do not depend on the JVM default locale
  // (e.g. under a Turkish locale "I" would lower-case to a dotless i).
  // NOTE(review): this file is JavaCC-generated; mirror the change in the
  // grammar source or it will be lost on regeneration.
  final String keyword = token.image.toLowerCase(Locale.ENGLISH);
  jj_consume_token(EQUALS);
  final String value = value();
  values.put(keyword, value);
}
/**
 * Parses one element, selected by the kind of the next token:
 *   kind 13: a new map is appended to inputs and filled by inputItem();
 *   kind 14: a new map is appended to interprets and filled by matchItem();
 *   kind 15: a KEYWORD followed by further KEYWORD [= value] items, all of
 *            which are consumed and discarded.
 * The element must then be closed by a token of kind 16 or kind 11.
 *
 * @throws ParseException if the next token starts none of the alternatives
 *         or the closing token is missing
 */
final public void element() throws ParseException {
  final int opener = (jj_ntk == -1) ? jj_ntk() : jj_ntk;
  if (opener == 13) {
    jj_consume_token(13);
    final HashMap inputAttrs = new HashMap();
    inputs.add(inputAttrs);
    while (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == KEYWORD) {
      inputItem(inputAttrs);
    }
    jj_la1[3] = jj_gen;
  } else if (opener == 14) {
    jj_consume_token(14);
    final HashMap interpretAttrs = new HashMap();
    interprets.add(interpretAttrs);
    while (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == KEYWORD) {
      matchItem(interpretAttrs);
    }
    jj_la1[4] = jj_gen;
  } else if (opener == 15) {
    jj_consume_token(15);
    jj_consume_token(KEYWORD);
    // Remaining attributes are recognised but their content is thrown away.
    while (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == KEYWORD) {
      jj_consume_token(KEYWORD);
      if (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == EQUALS) {
        jj_consume_token(EQUALS);
        value();
      } else {
        jj_la1[6] = jj_gen;
      }
    }
    jj_la1[5] = jj_gen;
  } else {
    jj_la1[7] = jj_gen;
    // Consuming kind -1 never matches, so this raises the parse error.
    jj_consume_token(-1);
    throw new ParseException();
  }

  final int closer = (jj_ntk == -1) ? jj_ntk() : jj_ntk;
  if (closer == 16) {
    jj_consume_token(16);
  } else if (closer == 11) {
    jj_consume_token(11);
  } else {
    jj_la1[8] = jj_gen;
    jj_consume_token(-1);
    throw new ParseException();
  }
}
/**
 * Parses one "KEYWORD [= value]" attribute and stores it in the given map
 * under the lower-cased keyword. When no "= value" part follows, the
 * keyword is stored with a null value.
 *
 * @param input map receiving the attribute
 * @throws ParseException if the next token is not a KEYWORD, or a value is
 *         missing after EQUALS
 */
final public void inputItem(HashMap input) throws ParseException {
  jj_consume_token(KEYWORD);
  // Use a fixed locale so keys do not depend on the JVM default locale
  // (e.g. under a Turkish locale "I" would lower-case to a dotless i).
  // NOTE(review): this file is JavaCC-generated; mirror the change in the
  // grammar source or it will be lost on regeneration.
  final String keyword = token.image.toLowerCase(Locale.ENGLISH);
  String value = null;
  if (((jj_ntk == -1) ? jj_ntk() : jj_ntk) == EQUALS) {
    jj_consume_token(EQUALS);
    value = value();
  } else {
    jj_la1[9] = jj_gen;
  }
  input.put(keyword, value);
}
/**
 * Parses one mandatory "KEYWORD = value" attribute and stores it in the
 * given map under the lower-cased keyword.
 *
 * @param interpret map receiving the attribute
 * @throws ParseException if the next tokens are not KEYWORD, EQUALS, value
 */
final public void matchItem(HashMap interpret) throws ParseException {
  jj_consume_token(KEYWORD);
  // Use a fixed locale so keys do not depend on the JVM default locale
  // (e.g. under a Turkish locale "I" would lower-case to a dotless i).
  // NOTE(review): this file is JavaCC-generated; mirror the change in the
  // grammar source or it will be lost on regeneration.
  final String keyword = token.image.toLowerCase(Locale.ENGLISH);
  jj_consume_token(EQUALS);
  final String value = value();
  interpret.put(keyword, value);
}
/**
 * Parses a single value token and returns its text. For a QUOTED_VALUE the
 * first and last characters of the token image are stripped; for an
 * UNQUOTED_VALUE the image is returned unchanged.
 *
 * @return the value text
 * @throws ParseException if the next token is neither kind of value
 */
final public String value() throws ParseException {
  final int upcoming = (jj_ntk == -1) ? jj_ntk() : jj_ntk;
  if (upcoming == QUOTED_VALUE) {
    jj_consume_token(QUOTED_VALUE);
    return token.image.substring(1, token.image.length() - 1);
  }
  if (upcoming == UNQUOTED_VALUE) {
    jj_consume_token(UNQUOTED_VALUE);
    return token.image;
  }
  jj_la1[10] = jj_gen;
  // Consuming kind -1 never matches, so this raises the parse error.
  jj_consume_token(-1);
  throw new ParseException();
}
// Token manager from which tokens are pulled via getNextToken().
public PageDescriptionTokenManager token_source;
// Character stream feeding token_source. Only the InputStream/Reader
// constructors assign it; it stays null when the parser is built directly
// from a token manager.
SimpleCharStream jj_input_stream;
// token: the most recently consumed token. jj_nt: the lookahead token as
// last read by jj_ntk() (null when the lookahead had to be fetched).
public Token token, jj_nt;
// Cached kind of the next token, or -1 when it has not been looked up yet.
private int jj_ntk;
// Generation counter, incremented each time a token is consumed.
private int jj_gen;
// For each of the 11 choice points, the value of jj_gen when that choice
// last fell through to its default branch (-1 if never).
final private int[] jj_la1 = new int[11];
// For each choice point, a bitmask of the token kinds that would have been
// accepted there (bit k set means kind k); read by generateParseException().
final private int[] jj_la1_0 = {0x40,0xe000,0x1000,0x40,0x40,0x40,0x80,0xe000,0x10800,0x80,0x300,};
/**
 * Creates a parser that reads its input from a byte stream.
 *
 * @param stream source of the text to parse
 */
public PageDescription(java.io.InputStream stream) {
  jj_input_stream = new SimpleCharStream(stream, 1, 1);
  token_source = new PageDescriptionTokenManager(jj_input_stream);
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Resets the parser state so it reads from a new byte stream.
 * Only the tokenizer and lookahead state are reset; the values, inputs and
 * interprets collections are left untouched.
 *
 * @param stream new source of the text to parse
 */
public void ReInit(java.io.InputStream stream) {
  jj_input_stream.ReInit(stream, 1, 1);
  token_source.ReInit(jj_input_stream);
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Creates a parser that reads its input from a character stream.
 *
 * @param stream source of the text to parse
 */
public PageDescription(java.io.Reader stream) {
  jj_input_stream = new SimpleCharStream(stream, 1, 1);
  token_source = new PageDescriptionTokenManager(jj_input_stream);
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Resets the parser state so it reads from a new character stream.
 * Only the tokenizer and lookahead state are reset; the values, inputs and
 * interprets collections are left untouched.
 *
 * @param stream new source of the text to parse
 */
public void ReInit(java.io.Reader stream) {
  jj_input_stream.ReInit(stream, 1, 1);
  token_source.ReInit(jj_input_stream);
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Creates a parser that pulls tokens from an existing token manager.
 * jj_input_stream is not assigned by this constructor.
 *
 * @param tm token manager supplying the tokens
 */
public PageDescription(PageDescriptionTokenManager tm) {
  token_source = tm;
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Resets the parser state so it pulls tokens from the given token manager.
 * Only the lookahead state is reset; the values, inputs and interprets
 * collections are left untouched.
 *
 * @param tm token manager supplying the tokens
 */
public void ReInit(PageDescriptionTokenManager tm) {
  token_source = tm;
  token = new Token();
  jj_gen = 0;
  jj_ntk = -1;
  // Mark every choice point as "never visited".
  java.util.Arrays.fill(jj_la1, -1);
}
/**
 * Advances to the next token and checks that it has the expected kind.
 * On a match the generation counter is bumped and the token returned; on a
 * mismatch the current token is restored, the expected kind is remembered
 * in jj_kind, and a ParseException is thrown.
 *
 * @param kind the token kind that must come next
 * @return the token just consumed
 * @throws ParseException if the next token is of a different kind
 */
final private Token jj_consume_token(int kind) throws ParseException {
  final Token previous = token;
  if (previous.next == null) {
    // Nothing buffered yet: fetch the next token and link it in.
    previous.next = token_source.getNextToken();
  }
  token = previous.next;
  jj_ntk = -1;
  if (token.kind != kind) {
    token = previous;
    jj_kind = kind;
    throw generateParseException();
  }
  jj_gen++;
  return token;
}
/**
 * Unconditionally advances to the next token, fetching it from the token
 * manager if it is not already buffered, and returns it.
 *
 * @return the new current token
 */
final public Token getNextToken() {
  final Token current = token;
  if (current.next == null) {
    current.next = token_source.getNextToken();
  }
  token = current.next;
  jj_ntk = -1;
  jj_gen++;
  return token;
}
/**
 * Returns the token index positions ahead of the current one without
 * consuming anything; tokens not yet buffered are fetched and linked in.
 * An index of 0 (or less) yields the current token.
 *
 * @param index how many tokens to look ahead
 * @return the token at that offset
 */
final public Token getToken(int index) {
  Token cursor = token;
  for (int remaining = index; remaining > 0; remaining--) {
    if (cursor.next == null) {
      cursor.next = token_source.getNextToken();
    }
    cursor = cursor.next;
  }
  return cursor;
}
/**
 * Looks up the kind of the next token, fetching that token from the token
 * manager if it is not buffered yet, and caches the kind in the jj_ntk field.
 *
 * @return the kind of the next token
 */
final private int jj_ntk() {
  jj_nt = token.next;
  if (jj_nt != null) {
    jj_ntk = jj_nt.kind;
    return jj_ntk;
  }
  // Nothing buffered: fetch, link behind the current token, cache its kind.
  final Token fetched = token_source.getNextToken();
  token.next = fetched;
  jj_ntk = fetched.kind;
  return jj_ntk;
}
// Scratch list of expected-token entries (each an int[1]); cleared and
// rebuilt on every call to generateParseException().
private java.util.Vector jj_expentries = new java.util.Vector();
// The entry most recently added to jj_expentries.
private int[] jj_expentry;
// Kind that jj_consume_token() expected when it last failed, or -1 if none
// is pending; reset to -1 by generateParseException().
private int jj_kind = -1;
/**
 * Builds a ParseException describing which token kinds would have been
 * acceptable at the current position. The expected set is the pending
 * jj_kind (if any) plus every kind allowed by a choice point that fell
 * through at the current generation.
 *
 * @return the exception to throw; it is not thrown here
 */
final public ParseException generateParseException() {
  jj_expentries.removeAllElements();

  // One flag per token kind; a fresh boolean[] is already all false.
  final boolean[] expected = new boolean[17];
  if (jj_kind >= 0) {
    expected[jj_kind] = true;
    jj_kind = -1;
  }

  for (int choice = 0; choice < 11; choice++) {
    if (jj_la1[choice] != jj_gen) {
      continue;
    }
    final int mask = jj_la1_0[choice];
    for (int bit = 0; bit < 32; bit++) {
      if ((mask & (1 << bit)) != 0) {
        expected[bit] = true;
      }
    }
  }

  for (int kind = 0; kind < 17; kind++) {
    if (expected[kind]) {
      jj_expentry = new int[1];
      jj_expentry[0] = kind;
      jj_expentries.addElement(jj_expentry);
    }
  }

  final int[][] exptokseq = new int[jj_expentries.size()][];
  for (int slot = 0; slot < exptokseq.length; slot++) {
    exptokseq[slot] = (int[]) jj_expentries.elementAt(slot);
  }
  return new ParseException(token, exptokseq, tokenImage);
}
/** No-op: the body is empty, so calling this has no effect. */
final public void enable_tracing() {
}
/** No-op: the body is empty, so calling this has no effect. */
final public void disable_tracing() {
}
}